Each of these commands will run an ad hoc http static server in your current (or specified) directory, available at http://localhost:8000. Use this power wisely.
$ python -m SimpleHTTPServer 8000
from deltalake import DeltaTable | |
dt = DeltaTable( | |
# Change this to your unique URI from a previous step | |
# if you’re using your own AWS credentials. | |
's3://mage-demo-public/magic-energy-and-battle-history/1337', | |
storage_options={ | |
'AWS_ACCESS_KEY_ID': '...', | |
'AWS_SECRET_ACCESS_KEY': '...', |
from deltalake.writer import write_deltalake | |
@data_exporter | |
def export_data(combined_data, *args, **kwargs): | |
write_deltalake( | |
# Change this URI to your own unique URI | |
's3://mage-demo-public/magic-energy-and-battle-history/1337', | |
data=combined_data, | |
mode='overwrite', |
from deltalake import DeltaTable | |
dt = DeltaTable( | |
# Change this to your unique URI from a previous step | |
# if you’re using your own AWS credentials. | |
's3://mage-demo-public/battle-history-versioned/1337', | |
storage_options={ | |
'AWS_ACCESS_KEY_ID': '...', | |
'AWS_SECRET_ACCESS_KEY': '...', |
from deltalake.writer import write_deltalake | |
# ['Aiur', 'Eos', 'Gaia', 'Kamigawa', 'Korhal', 'Ravnica'] | |
planets = list(sorted(set(df['planet'].values))) | |
# Loop through each planet | |
for planet in planets: | |
# Select a subset of the battle history data for a single planet | |
planet_df = df.query(f"`planet` == '{planet}'") |
from deltalake.writer import write_deltalake | |
write_deltalake( | |
# Change this URI to your own unique URI | |
's3://mage-demo-public/battle-history/1337', | |
data=df, | |
mode='overwrite', | |
overwrite_schema=True, | |
storage_options={ |
from deltalake import DeltaTable | |
import pandas as pd | |
@transformer | |
def transform(magic_energy, *args, **kwargs): | |
dt = DeltaTable( | |
# Change this to your unique URI from a previous step | |
# if you’re using your own AWS credentials. | |
's3://mage-demo-public/battle-history/1337', |
from deltalake import DeltaTable | |
dt = DeltaTable( | |
# Change this to your unique URI from a previous step | |
# if you’re using your own AWS credentials. | |
's3://mage-demo-public/battle-history/1337', | |
storage_options={ | |
'AWS_ACCESS_KEY_ID': '...', | |
'AWS_SECRET_ACCESS_KEY': '...', |
from deltalake import DeltaTable | |
@data_loader | |
def load_data(*args, **kwargs): | |
dt = DeltaTable( | |
's3://mage-demo-public/magic-energy/1337', | |
storage_options={ | |
'AWS_ACCESS_KEY_ID': '...', | |
'AWS_SECRET_ACCESS_KEY': '...', |
Each of these commands will run an ad hoc http static server in your current (or specified) directory, available at http://localhost:8000. Use this power wisely.
$ python -m SimpleHTTPServer 8000
import pandas as pd | |
df = pd.read_csv( | |
'https://raw.githubusercontent.com/mage-ai/datasets/master/battle_history.csv', | |
) |