Skip to content

Instantly share code, notes, and snippets.

import requests
from bs4 import BeautifulSoup
def make_soup(url):
    """Fetch ``url`` over HTTP and parse the response body.

    Args:
        url: Address handed to ``requests.get``.

    Returns:
        A ``BeautifulSoup`` object built from the response text.
    """
    # Request the address that was passed in. The previous body asked for
    # an unrelated name ``website``, so the ``url`` argument was ignored.
    response = requests.get(url)
    return BeautifulSoup(response.text)
# Build a parsed document for `website` by calling make_soup.
# NOTE(review): only this first statement is visible in the excerpt; what is
# done with `soup` afterwards is not shown here.
def initial_links(website):
soup = make_soup(website)
import os

# File whose on-disk size (in bytes, as reported by os.stat) is printed.
dest = 'apache-hive-0.14.0-bin.tar.gz'
# Call form of print: valid on both Python 2 and Python 3, whereas the
# statement form (`print expr`) is a SyntaxError on Python 3.
print(os.stat(dest).st_size)
# Remove three relative HDFS paths before importing.
# NOTE(review): `-rmr` is reported as deprecated in newer Hadoop releases in
# favor of `-rm -r` — confirm against the cluster's Hadoop version before changing.
hadoop fs -rmr ./AAA_AnnualReview
hadoop fs -rmr ./AAA_Employee
hadoop fs -rmr ./tbl_Underwriting_Extract
# Run a sqoop import of table AAA_AnnualReview from the SQL Server database
# `BigData` through the Microsoft JDBC driver; `-m 1` presumably limits the
# job to a single map task — verify against the sqoop documentation.
# NOTE(review): the password is passed in clear text on the command line;
# consider a prompt or password file if the installed sqoop supports one.
sqoop import --driver com.microsoft.sqlserver.jdbc.SQLServerDriver --connect 'jdbc:sqlserver://sa3sql500:51433;database=BigData' --table AAA_AnnualReview --username BigData_ETL_User --password BigData_ETL_User -m 1
import math
import string
from nltk.corpus import stopwords
from pyspark.sql.functions import udf
from pyspark.sql.types import *
# Return 1 when `headline` contains any of the question-style keywords below.
# The check is a plain `in` test against `headline`, so if `headline` is a
# string, a keyword also matches inside longer words (e.g. 'is' within 'this')
# and the comparison is case-sensitive.
# NOTE(review): no return is visible for the non-matching case in this
# excerpt (as shown the function would yield None); the snippet may be
# truncated — confirm against the full source.
def question_headline( headline):
keywords = ['?', 'should', 'can', 'if', 'is', 'would', 'why', 'how', 'when', "where"]
if any(word in headline for word in keywords):
return 1
from faker import Faker
# Script fragment: builds fake "name, address" text rows while a running
# `size` counter stays below `outsize`, with `outfile` opened for writing.
fake = Faker()
outfile = 'data.csv'
outsize = 1024 * 1024 * 1024 # 1GB
with open(outfile, 'w') as csvfile:
size = 0
while size < outsize:
# NOTE(review): the excerpt ends right after `txt` is built — no write to
# `csvfile` and no update of `size` are visible here, so as shown the loop
# would never terminate. Presumably the remainder is cut off; confirm
# against the full source.
txt = '%s, %s\n' % (fake.name(), fake.address())
from faker import Faker
import datetime
import random
import sys
import csv
fake = Faker()
outfile = 'data_test.csv'
from faker import Faker
import datetime
import random
import sys
import csv
startTime = datetime.datetime.now()
fake = Faker()
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
package adwords_crm;
import com.google.api.ads.adwords.axis.factory.AdWordsServices;
import com.google.api.ads.adwords.axis.v201605.cm.CampaignCriterion;
import com.google.api.ads.adwords.axis.v201609.cm.AdGroupCriterionOperation;
import com.google.api.ads.adwords.axis.v201609.cm.AdGroupCriterionReturnValue;
import com.google.api.ads.adwords.axis.v201609.cm.AdGroupCriterionServiceInterface;
import com.google.api.ads.adwords.axis.v201609.cm.AdGroupServiceInterface;
import com.google.api.ads.adwords.axis.v201609.cm.ApiException;
import com.google.api.ads.adwords.axis.v201609.cm.BiddableAdGroupCriterion;
package adwords_crm;
import com.google.api.ads.adwords.axis.factory.AdWordsServices;
import com.google.api.ads.adwords.axis.v201609.cm.CampaignCriterion;
import com.google.api.ads.adwords.axis.v201609.cm.AdGroupCriterionOperation;
import com.google.api.ads.adwords.axis.v201609.cm.AdGroupCriterionReturnValue;
import com.google.api.ads.adwords.axis.v201609.cm.AdGroupCriterionServiceInterface;
import com.google.api.ads.adwords.axis.v201609.cm.AdGroupServiceInterface;
import com.google.api.ads.adwords.axis.v201609.cm.ApiException;
import com.google.api.ads.adwords.axis.v201609.cm.BiddableAdGroupCriterion;