Skip to content

Instantly share code, notes, and snippets.

View chapmanjacobd's full-sized avatar
🥅
goal_net

Jacob Chapman chapmanjacobd

🥅
goal_net
View GitHub Profile
@chapmanjacobd
chapmanjacobd / titles.nd.js
Created May 6, 2024 15:06
Copy all titles from reddit page
// Gather the rendered text of every element matching the `.title` selector and
// join the pieces with newlines. Left as a bare expression so that a browser
// console evaluating it shows the resulting string.
Array.from(document.querySelectorAll('.title'), (el) => el.innerText).join('\n');

Have you ever wanted to do:

SELECT * FROM www.google.com

With BigQuery you kind of can. But have you ever wanted to do:

SELECT * FROM www.wikipedia.com

With the Wikidata Query Service you kind of can (semantic web! RDF!? See https://www.w3.org/wiki/SparqlImplementations).

class HtmlList:
def __init__(self):
self.tree = []
self.xpath = []
def resolve_parents(self, el) -> list:
if el.parent is None:
return self.xpath
else:
import argparse, re, webbrowser
from xklb.utils import web
def search_art(term):
search_url = f"https://artsandculture.google.com/search?q={term.replace(' ', '+')}"
response = web.requests_session().get(search_url)
if response.status_code == 200:
@chapmanjacobd
chapmanjacobd / eda sqlite example
Created March 24, 2024 16:22
lb eda temp.db -L inf
$ lb eda temp.db -L inf
## temp.db:playlists
### Shape
(1, 8)
### Sample of rows
| | id | time_modified | time_deleted | extractor_config | extractor_key | path | time_created | hours_update_delay |
def cover_scan(media_duration, scan_percentage):
num_scans = max(2, int(math.log(media_duration) * (scan_percentage / 10)))
scan_duration_total = max(1, media_duration * (scan_percentage / 100))
scan_duration = max(1, int(scan_duration_total / num_scans))
scan_interval = media_duration / num_scans
scans = sorted(set(int(scan * scan_interval) for scan in range(num_scans)))
if scans[-1] < media_duration - (scan_duration * 2):
scans.append(math.floor(media_duration - scan_duration))
def get_file_part(file_path, specifier):
size = file_path.stat().st_size
if specifier.isdigit():
specifier = int(specifier)
if specifier > 0:
with file_path.open('rb') as file:
return file.read(specifier)
else:
def compare_stats(destination_files, destination_folders, source_files, source_empty_folders):
new_empty_folders = source_empty_folders - destination_folders
source_dirs = {p.parent for p in source_files}
destination_dirs = {p.parent for p in destination_files}
new_directories = source_dirs - destination_dirs
new_files = source_files - destination_files
replaced_files = source_files & destination_files
trumped_files = replaced_files.intersection(source_files | destination_files)
class FFProbe:
def __init__(self, path, *args):
args = ["ffprobe", "-show_format", "-show_streams", "-show_chapters", "-of", "json", *args, path]
p = subprocess.Popen(args, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
out, err = p.communicate()
if p.returncode != 0:
raise RuntimeError(out, err)
d = json.loads(out.decode("utf-8"))
kern :info : [ +0.000006] BTRFS info (device sde: state A): dumping space info:
kern :info : [ +0.000006] BTRFS info (device sde: state A): space_info DATA has 142864384 free, is not full
kern :info : [ +0.000006] BTRFS info (device sde: state A): space_info total=9971804340224, used=9688658702336, pinned=283002445824, reserved=0, may_use=0, readonly=327680 zone_unusable=0
kern :info : [ +0.000009] BTRFS info (device sde: state A): space_info METADATA has 0 free, is full
kern :info : [ +0.000005] BTRFS info (device sde: state A): space_info total=15032385536, used=14061862912, pinned=329777152, reserved=640679936, may_use=0, readonly