Nov05

## selenium.py
# Notebook setup cell: lines starting with `!` are shell commands, so this
# presumably targets an IPython/Colab-style environment, not plain Python.
# Install the Chromium chromedriver package via apt.
!apt install chromium-chromedriver
# Copy the driver binary into /usr/bin (presumably so it is found on PATH).
!cp /usr/lib/chromium-browser/chromedriver /usr/bin
# Install the selenium Python bindings.
!pip install selenium
# Build a ChromeOptions object (presumably passed to the Chrome driver later).
from selenium import webdriver
options = webdriver.ChromeOptions()
# Run Chrome without opening a visible browser window.
options.add_argument('--headless')
# Disable Chrome's sandbox (commonly needed when running as root in a
# container; TODO confirm this is required in the target environment).
options.add_argument('--no-sandbox')
# Do not rely on /dev/shm for shared memory (often small in containers).
options.add_argument('--disable-dev-shm-usage')

## 2019-08-02 Check Heroku Logs and Debug.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                Nov05
                / 2019-08-02 Check Heroku Logs and Debug.md
            
            
              Last active
              August 3, 2019 03:47
            
          
    2019-08-01
Check Heroku Logs and Debug

Dash App on Heroku

https://hours-estimate.herokuapp.com/

GitHub Repo

https://github.com/Nov05/DS-Unit-2-Sprint-4-Project

To view the build log, navigate to: Heroku > hours-estimate (or your own app name) > Activity > View build log


## 2019-08-05 anaconda.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                Nov05
                / 2019-08-05 anaconda.md
            
            
              Last active
              August 5, 2019 18:50
            
          
    2019-08-05

Anaconda Logs
Unit 3 Module 1 Python Packages and Environments

https://github.com/Nov05/DS-Unit-3-Sprint-1-Software-Engineering/tree/master/module1-python-modules-packages-and-environments
Managing Environments (Anaconda)

https://docs.conda.io/projects/conda/en/latest/user-guide/tasks/manage-environments.html
Windows 10, Anaconda Prompt

  
## 2019-10-20 fireball.md

      
              1 file
            
          
              0 forks
            
          
              1 comment
            
          
              0 stars
            
          
                Nov05
                / 2019-10-20 fireball.md
            
            
              Last active
              October 20, 2019 09:09
            
          
    import pandas as pd
import numpy as np

import matplotlib.pyplot as plt
import seaborn as sns
import pandas_profiling
import plotly
import plotly.graph_objects as go
from sklearn.preprocessing import MinMaxScaler


## 2019-10-20 custom colorscale.md

      
              1 file
            
          
              0 forks
            
          
              1 comment
            
          
              0 stars
            
          
                Nov05
                / 2019-10-20 custom colorscale.md
            
            
              Created
              October 20, 2019 09:55
            
          
    !pip install colorlover
# Successfully installed colorlover-0.3.0

import pandas as pd
import numpy as np

import matplotlib.pyplot as plt


## 2019-10-20 random forest.md

      
              1 file
            
          
              0 forks
            
          
              1 comment
            
          
              0 stars
            
          
                Nov05
                / 2019-10-20 random forest.md
            
            
              Last active
              October 21, 2019 21:14
            
          
    Baseline

# Baseline: hold out a validation split, then predict the training-set mean
# for every validation row and report the resulting mean squared error.
X_train, X_val, y_train, y_val = train_test_split(
    X_trainval,
    y_trainval,
    test_size=0.33,
    random_state=42,
)
train_mean = y_train.mean()
print("train mean velocity:", train_mean)
# One constant prediction per validation sample.
y_val_pred = [train_mean for _ in range(len(y_val))]
baseline_mse = mean_squared_error(y_val, y_val_pred)
print('baseline error score:', baseline_mse)


## json_to_csv.py
'''
Load Yelp JSON files and write them out as CSV files.
Uses pandas json_normalize rather than reinventing the wheel.
Somewhat hacky and needs a fair amount of RAM, but it works, albeit naively.

Tested with Yelp JSON files in dataset challenge round 12:
https://www.yelp.com/dataset/challenge
'''

import json

## 2020-02-29 python code snippet.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                Nov05
                / 2020-02-29 python code snippet.md
            
            
              Last active
              February 29, 2020 18:07
            
          
    Find the elements that appear in both lists.
import time
# Read each names file in full, then break the text into a list on newlines.
with open('names_1.txt', 'r') as first_handle:
    first_text = first_handle.read()
names_1 = first_text.split("\n")  # List containing 10000 names
with open('names_2.txt', 'r') as second_handle:
    second_text = second_handle.read()
names_2 = second_text.split("\n")  # List containing 10000 names


## model.py
import torch
import torch.nn as nn
import torch.nn.functional as F
import torchvision.models as models


class EncoderCNN(nn.Module):
    def __init__(self, embed_size):
        # super(EncoderCNN, self).__init__()
        super().__init__()

## 20230509 panda express sales data on a receipt
Time,Cnt,Sales,%Sales
10:00AM-10:30AM,7,"$108.60",0.2
10:30AM-11:00AM,62,"$970.59",1.84
11:00AM-11:30AM,102,"$1,399.29",2.66
11:30AM-12:00PM,174,"$2,592.46",4.94
12:00PM-12:30PM,210,"$2,847.98",5.42
12:30PM-1:00PM,189,"$2,609.96",4.97
1:00PM-1:30PM,163,"$2,388.46",4.55
1:30PM-2:00PM,168,"$2,222.29",4.23
2:00PM-2:30PM,104,"$1,430.59",2.72
	# install chromium, its driver, and selenium
	!apt install chromium-chromedriver
	!cp /usr/lib/chromium-browser/chromedriver /usr/bin
	!pip install selenium
	# set options to be headless, ..
	from selenium import webdriver
	options = webdriver.ChromeOptions()
	options.add_argument('--headless')
	options.add_argument('--no-sandbox')
	options.add_argument('--disable-dev-shm-usage')
	'''
	Load Yelp JSON files and spit out CSV files
	Does not try to reinvent the wheel and uses pandas json_normalize
	Kinda hacky and requires a bit of RAM. But works, albeit naively.

	Tested with Yelp JSON files in dataset challenge round 12:
	https://www.yelp.com/dataset/challenge
	'''

	import json
	import torch
	import torch.nn as nn
	import torch.nn.functional as F
	import torchvision.models as models


	class EncoderCNN(nn.Module):
	def __init__(self, embed_size):
	# super(EncoderCNN, self).__init__()
	super().__init__()
	Time,Cnt,Sales,%Sales
	10:00AM-10:30AM,7,"$108.60",0.2
	10:30AM-11:00AM,62,"$970.59",1.84
	11:00AM-11:30AM,102,"$1,399.29",2.66
	11:30AM-12:00PM,174,"$2,592.46",4.94
	12:00PM-12:30PM,210,"$2,847.98",5.42
	12:30PM-1:00PM,189,"$2,609.96",4.97
	1:00PM-1:30PM,163,"$2,388.46",4.55
	1:30PM-2:00PM,168,"$2,222.29",4.23
	2:00PM-2:30PM,104,"$1,430.59",2.72