Skip to content

Instantly share code, notes, and snippets.

View Hosuke's full-sized avatar
🐢
I code slowly

Huang Geyang Hosuke

🐢
I code slowly
View GitHub Profile
@Hosuke
Hosuke / csv2trinosql.py
Created January 9, 2024 10:39
csv to trino static query
import pandas as pd
if __name__ == '__main__':
# Load the CSV file into a DataFrame
file_path = '01HKPMHCEM0TFYD6KNPM66XHTT.csv'
df = pd.read_csv(file_path)
# Construct the SQL query in the desired format with dynamic field names
sql_query = "SELECT "
@Hosuke
Hosuke / seed_gen.py
Last active November 15, 2023 14:10
import pandas as pd
import yaml
# Read the CSV file
df = pd.read_csv('dex_base_trades_seed.csv')
# Initialize the schema dictionary
schema = {
"version": 2,
"seeds": []
import os
import re
# Get the current working directory
directory = os.getcwd()
# Iterate over all files in the directory and its subdirectories
for dirpath, dirnames, filenames in os.walk(directory):
for filename in filenames:
# Process only files with a .sql extension
import os
import re
# Get the current working directory
directory = os.getcwd()
# Define the regular expression for dates
date_pattern = r"'((19|20)\d\d[-](0[1-9]|1[012])[-](0[1-9]|[12][0-9]|3[01]))'"
# Iterate over all files in the directory and all of its subdirectories
import os
import re
# Get the current working directory
directory = os.getcwd()
# Iterate over all files in the directory and all of its subdirectories
for dirpath, dirnames, filenames in os.walk(directory):
for filename in filenames:
# Process only .sql files
import os
import re
# Get the current working directory
directory = os.getcwd()
# Iterate over all files in the directory and all of its subdirectories
for dirpath, dirnames, filenames in os.walk(directory):
for filename in filenames:
# Process only .sql files
import json
def get_model_dependencies(manifest_file, model_name):
with open(manifest_file, 'r') as f:
manifest = json.load(f)
# Build the adjacency list
adj_list = {}
for full_model_name, model in manifest['nodes'].items():
if not full_model_name.startswith('model.'):
import json
def get_model_dependencies(manifest_file, model_name):
with open(manifest_file, 'r') as f:
manifest = json.load(f)
def get_dependencies(full_model_name, indent=0):
if full_model_name.startswith('model.'):
model = manifest['nodes'].get(full_model_name)
if model is None:
import os
import re
import shutil
# Get current dir
dir_path = os.getcwd()
for root, dirs, files in os.walk(dir_path):
for file in files:
@Hosuke
Hosuke / trino_spells_mover.py
Last active July 11, 2023 05:58
trino_spells_mover
import os
import re
import shutil
def replace_with_alias_macros(model_contents):
"""
Replace alias = 'some_alias' with alias('some_alias', legacy_model=True)
"""
pattern = r"alias\s*=\s*'([^']*)'"
# replace alias with legacy alias