Jiawei Li iewaij

## spark.py
from pyspark.sql import *
import matplotlib.pyplot as pyplot
import seaborn as sns
import pandas as pd

# Create (or reuse) a SparkSession that runs against the local master.
spark = (
    SparkSession.builder
    .master("local[*]")
    .appName("MADS 2020")
    .getOrCreate()
)

# Read the semicolon-separated machine log with header and schema-inference
# options enabled.
data = spark.read.csv(
    "data/machine_log.csv",
    sep=";",
    header="True",
    inferSchema="True",
)

# Take a random sample (fraction 0.1) using a fixed seed.
data_sample = data.sample(seed=42, fraction=0.1)

# some compounds have fewer produced units

## timing.ipynb

      
        
          
            
              
              1 file
            
          
          
            
              
              0 forks
            
          
          
            
              
              0 comments
            
          
          
            
              
              0 stars
            
          
        
        
          
              
          
          
            
                iewaij
                / timing.ipynb
            
            
              Created
              June 23, 2018 00:50
            
          
        
      
        
  
    
    

          
    
        Loading

      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
	from pyspark.sql import *
	import matplotlib.pyplot as pyplot
	import seaborn as sns
	import pandas as pd

	# Create (or reuse) a SparkSession that runs against the local master.
	spark = (
	    SparkSession.builder
	    .master("local[*]")
	    .appName("MADS 2020")
	    .getOrCreate()
	)

	# Read the semicolon-separated machine log with header and schema-inference
	# options enabled.
	data = spark.read.csv(
	    "data/machine_log.csv",
	    sep=";",
	    header="True",
	    inferSchema="True",
	)

	# Take a random sample (fraction 0.1) using a fixed seed.
	data_sample = data.sample(seed=42, fraction=0.1)

	# some compounds have fewer produced units